@book{breiman2017classification,
  title={Classification and regression trees},
  author={Breiman, Leo},
  year={2017},
  publisher={Routledge}
}

@article{chen2017learning,
  title={Learning discrete Bayesian networks from continuous data},
  author={Chen, Yi-Chun and Wheeler, Tim A and Kochenderfer, Mykel J},
  journal={Journal of Artificial Intelligence Research},
  volume={59},
  pages={103--132},
  year={2017}
}

@article{park2018data,
  title={Data synthesis based on generative adversarial networks},
  author={Park, Noseong and Mohammadi, Mahmoud and Gorde, Kshitij and Jajodia, Sushil and Park, Hongkyu and Kim, Youngmin},
  journal={arXiv preprint arXiv:1806.03384},
  year={2018}
}

@article{rosenbaum1983central,
  title={The central role of the propensity score in observational studies for causal effects},
  author={Rosenbaum, Paul R and Rubin, Donald B},
  journal={Biometrika},
  volume={70},
  number={1},
  pages={41--55},
  year={1983},
  publisher={Oxford University Press}
}

@article{drechsler2010sampling,
  title={Sampling with synthesis: A new approach for releasing public use census microdata},
  author={Drechsler, J{\"o}rg and Reiter, Jerome P},
  journal={Journal of the American Statistical Association},
  volume={105},
  number={492},
  pages={1347--1357},
  year={2010},
  publisher={Taylor \& Francis}
}

@article{snoke2018general,
  title={General and specific utility measures for synthetic data},
  author={Snoke, Joshua and Raab, Gillian M and Nowok, Beata and Dibben, Chris and Slavkovic, Aleksandra},
  journal={Journal of the Royal Statistical Society Series A: Statistics in Society},
  volume={181},
  number={3},
  pages={663--688},
  year={2018},
  publisher={Oxford University Press}
}

@inproceedings{
    francis_wagner_yyyy,
    title={On the widespread failures of measuring data anonymity vulnerabilities},
    author={Francis Paul and Wagner, David},
    booktitle={In Proceedings of Proceedings on Privacy Enhancing Technologies},
    year={YYYY},
    pages={13 pages},
    doi={https://doi.org/XXXXXXX.XXXXXXX}
}

@article{caiola2010random,
  title={Random Forests for Generating Partially Synthetic, Categorical Data.},
  author={Caiola, Gregory and Reiter, Jerome P},
  journal={Trans. Data Priv.},
  volume={3},
  number={1},
  pages={27--42},
  year={2010},
  publisher={Citeseer}
}

@article{kenny2021use,
  title={The use of differential privacy for census data and its impact on redistricting: The case of the 2020 US Census},
  author={Kenny, Christopher T and Kuriwaki, Shiro and McCartan, Cory and Rosenman, Evan TR and Simko, Tyler and Imai, Kosuke},
  journal={Science advances},
  volume={7},
  number={41},
  pages={eabk3283},
  year={2021},
  publisher={American Association for the Advancement of Science}
}

@article{raab2021assessing,
  title={Assessing, visualizing and improving the utility of synthetic data},
  author={Raab, Gillian M and Nowok, Beata and Dibben, Chris},
  journal={arXiv preprint arXiv:2109.12717},
  year={2021}
}

@article{young2009using,
  title={Using Bayesian networks to create synthetic data},
  author={Young, Jim and Graham, Patrick and Penny, Richard},
  journal={Journal of Official Statistics},
  volume={25},
  number={4},
  pages={549--567},
  year={2009},
  publisher={Statistics Sweden (SCB)}
}


@inproceedings{
    patki2016synthetic,
    title={The Synthetic data vault},
    author={Patki, Neha and Wedge, Roy and Veeramachaneni, Kalyan},
    booktitle={IEEE International Conference on Data Science and Advanced Analytics (DSAA)},
    year={2016},
    pages={399-410},
    doi={10.1109/DSAA.2016.49},
    month={Oct}
}

@incollection{Bengio+chapter2007,
author = {Bengio, Yoshua and LeCun, Yann},
booktitle = {Large Scale Kernel Machines},
publisher = {MIT Press},
title = {Scaling Learning Algorithms Towards {AI}},
year = {2007}
}

@inproceedings{ping2017datasynthesizer,
  title={Datasynthesizer: Privacy-preserving synthetic datasets},
  author={Ping, Haoyue and Stoyanovich, Julia and Howe, Bill},
  booktitle={Proceedings of the 29th International Conference on Scientific and Statistical Database Management},
  pages={1--5},
  year={2017}
}

@misc{jordon2022synthetic,
      title={Synthetic Data -- what, why and how?}, 
      author={James Jordon and Lukasz Szpruch and Florimond Houssiau and Mirko Bottarelli and Giovanni Cherubin and Carsten Maple and Samuel N. Cohen and Adrian Weller},
      year={2022},
      eprint={2205.03257},
      archivePrefix={arXiv},
      primaryClass={cs.LG}
}

@article{Hinton06,
author = {Hinton, Geoffrey E. and Osindero, Simon and Teh, Yee Whye},
journal = {Neural Computation},
pages = {1527--1554},
title = {A Fast Learning Algorithm for Deep Belief Nets},
volume = {18},
year = {2006}
}

@book{goodfellow2016deep,
title={Deep learning},
author={Goodfellow, Ian and Bengio, Yoshua and Courville, Aaron and Bengio, Yoshua},
volume={1},
year={2016},
publisher={MIT Press}
}

@article{little2021generative,
  title={Generative adversarial networks for synthetic data generation: a comparative study},
  author={Little, Claire and Elliot, Mark and Allmendinger, Richard and Samani, Sahel Shariati},
  journal={arXiv preprint arXiv:2112.01925},
  year={2021}
}

@inproceedings{ctgan,
   title={Modeling Tabular data using Conditional GAN},
   author={Xu, Lei and Skoularidou, Maria and Cuesta-Infante, Alfredo and Veeramachaneni, Kalyan},
   booktitle={Advances in Neural Information Processing Systems},
   year={2019}
}

@article{hu2021multiple,
  title={Multiple Imputation and Synthetic Data Generation with NPBayesImputeCat.},
  author={Hu, Jingchen and Akande, Olanrewaju and Wang, Quanli},
  journal={R Journal},
  volume={13},
  number={2},
  year={2021}
}


@misc{raab2022utility,
      title={Utility and Disclosure Risk for Differentially Private Synthetic Categorical Data}, 
      author={Gillian M Raab},
      year={2022},
      eprint={2206.01362},
      archivePrefix={arXiv},
      primaryClass={stat.AP}
}

@article{raab2017guidelines,
  title={Guidelines for producing useful synthetic data},
  author={Raab, Gillian M and Nowok, Beata and Dibben, Chris},
  journal={arXiv preprint arXiv:1712.04078},
  year={2017}
}


@misc{brown2023fast,
      title={Fast, Sample-Efficient, Affine-Invariant Private Mean and Covariance Estimation for Subgaussian Distributions}, 
      author={Gavin Brown and Samuel B. Hopkins and Adam Smith},
      year={2023},
      eprint={2301.12250},
      archivePrefix={arXiv},
      primaryClass={cs.LG}
}

@misc{alabi2023privately,
      title={Privately Estimating a Gaussian: Efficient, Robust and Optimal}, 
      author={Daniel Alabi and Pravesh K. Kothari and Pranay Tankala and Prayaag Venkat and Fred Zhang},
      year={2023},
      eprint={2212.08018},
      archivePrefix={arXiv},
      primaryClass={cs.DS}
}

@inproceedings{little2022comparing,
  title={Comparing the Utility and Disclosure Risk of Synthetic Data with Samples of Microdata},
  author={Little, Claire and Elliot, Mark and Allmendinger, Richard},
  booktitle={International Conference on Privacy in Statistical Databases},
  pages={234--249},
  year={2022},
  organization={Springer}
}

@article{dankar2021fake,
  title={Fake it till you make it: Guidelines for effective synthetic data generation},
  author={Dankar, Fida K and Ibrahim, Mahmoud},
  journal={Applied Sciences},
  volume={11},
  number={5},
  pages={21--58},
  year={2021},
  publisher={MDPI}
}

@article{rubin1993statistical,
  title={Statistical disclosure limitation},
  author={Rubin, Donald B},
  journal={Journal of official Statistics},
  volume={9},
  number={2},
  pages={461--468},
  year={1993}
}

@article{reiter2009estimating,
  title={Estimating risks of identification disclosure in partially synthetic data},
  author={Reiter, Jerome P and Mitra, Robin},
  journal={Journal of Privacy and Confidentiality},
  volume={1},
  number={1},
  year={2009}
}

@article{little1993statistical,
  title={Statistical analysis of masked data},
  author={Little, Roderick JA and others},
  journal={Journal of official statistics},
  volume={9},
  pages={407--407},
  year={1993},
  publisher={ALMQVIST \& WIKSELL INTERNATIONAL}
}

@article{reiter2010releasing,
  title={Releasing multiply-imputed synthetic data generated in two stages to protect confidentiality},
  author={Reiter, Jerome P and Drechsler, J{\"o}rg},
  journal={Statistica Sinica},
  pages={405--421},
  year={2010},
  publisher={JSTOR}
}

@article{taub2020impact,
  title={The Impact of Synthetic Data Generation on Data Utility with Application to the 1991 UK Samples of Anonymised Records.},
  author={Taub, Jennifer and Elliot, Mark and Sakshaug, Joseph W},
  journal={Trans. Data Priv.},
  volume={13},
  number={1},
  pages={1--23},
  year={2020}
}

@article{drechsler2009disclosure,
  title={Disclosure risk and data utility for partially synthetic data: An empirical study using the German IAB Establishment Survey},
  author={Drechsler, Jorg and Reiter, JP},
  journal={Journal of Official Statistics},
  volume={25},
  number={4},
  pages={589--603},
  year={2009},
  publisher={Statistics Sweden (SCB)}
}

@article{woo2009global,
  title={Global measures of data utility for microdata masked for disclosure limitation},
  author={Woo, Mi-Ja and Reiter, Jerome P and Oganian, Anna and Karr, Alan F},
  journal={Journal of Privacy and Confidentiality},
  volume={1},
  number={1},
  year={2009}
}

@article{karr2006framework,
  title={A framework for evaluating the utility of data altered to protect confidentiality},
  author={Karr, Alan F and Kohnen, Christine N and Oganian, Anna and Reiter, Jerome P and Sanil, Ashish P},
  journal={The American Statistician},
  volume={60},
  number={3},
  pages={224--232},
  year={2006},
  publisher={Taylor \& Francis}
}

@article{nowok2016synthpop,
  title={synthpop: Bespoke creation of synthetic data in R},
  author={Nowok, Beata and Raab, Gillian M and Dibben, Chris},
  journal={Journal of statistical software},
  volume={74},
  pages={1--26},
  year={2016}
}

@article{van2011mice,
  title={mice: Multivariate imputation by chained equations in R},
  author={Van Buuren, Stef and Groothuis-Oudshoorn, Karin},
  journal={Journal of statistical software},
  volume={45},
  pages={1--67},
  year={2011}
}

@article{reiter2005using,
  title={Using CART to generate partially synthetic public use microdata},
  author={Reiter, Jerome P},
  journal={Journal of official statistics},
  volume={21},
  number={3},
  pages={441},
  year={2005},
  publisher={Statistics Sweden (SCB)}
}

@article{liew1985data,
  title={A data distortion by probability distribution},
  author={Liew, Chong K and Choi, Uinam J and Liew, Chung J},
  journal={ACM Transactions on Database Systems (TODS)},
  volume={10},
  number={3},
  pages={395--411},
  year={1985},
  publisher={ACM New York, NY, USA}
}

@inproceedings{drechsler2022challenges,
  title={Challenges in measuring utility for fully synthetic data},
  author={Drechsler, J{\"o}rg},
  booktitle={International Conference on Privacy in Statistical Databases},
  pages={220--233},
  year={2022},
  organization={Springer}
}

@article{drechsler2011empirical,
  title={An empirical evaluation of easily implemented, nonparametric methods for generating synthetic datasets},
  author={Drechsler, J{\"o}rg and Reiter, Jerome P},
  journal={Computational Statistics \& Data Analysis},
  volume={55},
  number={12},
  pages={3232--3243},
  year={2011},
  publisher={Elsevier}
}

@article{drechsler202330,
  title={30 Years of Synthetic Data},
  author={Drechsler, Joerg and Haensch, Anna-Carolina},
  journal={arXiv preprint arXiv:2304.02107},
  year={2023}
}

@article{levy1992us,
  title={US earnings levels and earnings inequality: A review of recent trends and proposed explanations},
  author={Levy, Frank and Murnane, Richard J},
  journal={Journal of economic literature},
  volume={30},
  number={3},
  pages={1333--1381},
  year={1992},
  publisher={JSTOR}
}

@article{piketty2006evolution,
  title={The evolution of top incomes: a historical and international perspective},
  author={Piketty, Thomas and Saez, Emmanuel},
  journal={American economic review},
  volume={96},
  number={2},
  pages={200--205},
  year={2006},
  publisher={American Economic Association}
}

@article{sweeney2002k,
  title={k-anonymity: A model for protecting privacy},
  author={Sweeney, Latanya},
  journal={International journal of uncertainty, fuzziness and knowledge-based systems},
  volume={10},
  number={05},
  pages={557--570},
  year={2002},
  publisher={World Scientific}
}

@article{machanavajjhala2007diversity,
  title={l-diversity: Privacy beyond k-anonymity},
  author={Machanavajjhala, Ashwin and Kifer, Daniel and Gehrke, Johannes and Venkitasubramaniam, Muthuramakrishnan},
  journal={ACM Transactions on Knowledge Discovery from Data (TKDD)},
  volume={1},
  number={1},
  pages={3--es},
  year={2007},
  publisher={ACM New York, NY, USA}
}

@inproceedings{li2006t,
  title={t-closeness: Privacy beyond k-anonymity and l-diversity},
  author={Li, Ninghui and Li, Tiancheng and Venkatasubramanian, Suresh},
  booktitle={2007 IEEE 23rd international conference on data engineering},
  pages={106--115},
  year={2006},
  organization={IEEE}
}

@article{duncan2004database,
  title={Database security and confidentiality: examining disclosure risk vs. data utility through the RU confidentiality map},
  author={Duncan, George T and Keller-McNulty, Sallie A and Stokes, S Lynne},
  journal={Los Alamos National Laboratory, NM: National Institute for Statistical Sciences},
  year={2004}
}

@inproceedings{dwork2006calibrating,
  title={Calibrating noise to sensitivity in private data analysis},
  author={Dwork, Cynthia and McSherry, Frank and Nissim, Kobbi and Smith, Adam},
  booktitle={Theory of Cryptography: Third Theory of Cryptography Conference, TCC 2006, New York, NY, USA, March 4-7, 2006. Proceedings 3},
  pages={265--284},
  year={2006},
  organization={Springer}
}

@article{doove2014recursive,
  title={Recursive partitioning for missing data imputation in the presence of interaction effects},
  author={Doove, Lisa L and Van Buuren, Stef and Dusseldorp, Elise},
  journal={Computational statistics \& data analysis},
  volume={72},
  pages={92--104},
  year={2014},
  publisher={Elsevier}
}


@misc{synthcity,
  doi = {10.48550/ARXIV.2301.07573},
  url = {https://arxiv.org/abs/2301.07573},
  author = {Qian, Zhaozhi and Cebere, Bogdan-Constantin and van der Schaar, Mihaela},
  keywords = {Machine Learning (cs.LG), Artificial Intelligence (cs.AI), FOS: Computer and information sciences, FOS: Computer and information sciences},
  title = {Synthcity: facilitating innovative use cases of synthetic data in different data modalities},
  year = {2023},
  copyright = {Creative Commons Attribution 4.0 International}
}

@article{goodfellow2014generative,
  title={Generative adversarial nets},
  author={Goodfellow, Ian and Pouget-Abadie, Jean and Mirza, Mehdi and Xu, Bing and Warde-Farley, David and Ozair, Sherjil and Courville, Aaron and Bengio, Yoshua},
  journal={Advances in neural information processing systems},
  volume={27},
  year={2014}
}


@inproceedings{drechsler2010using,
  title={Using support vector machines for generating synthetic datasets},
  author={Drechsler, J{\"o}rg},
  booktitle={Privacy in Statistical Databases: UNESCO Chair in Data Privacy, International Conference, PSD 2010, Corfu, Greece, September 22-24, 2010. Proceedings},
  pages={148--161},
  year={2010},
  organization={Springer}
}

@article{beaulieu2019privacy,
  title={Privacy-preserving generative deep neural networks support clinical data sharing},
  author={Beaulieu-Jones, Brett K and Wu, Zhiwei Steven and Williams, Chris and Lee, Ran and Bhavnani, Sanjeev P and Byrd, James Brian and Greene, Casey S},
  journal={Circulation: Cardiovascular Quality and Outcomes},
  volume={12},
  number={7},
  pages={e005122},
  year={2019},
  publisher={Am Heart Assoc}
}

@article{neunhoeffer2020private,
  title={Private post-gan boosting},
  author={Neunhoeffer, Marcel and Wu, Zhiwei Steven and Dwork, Cynthia},
  journal={arXiv preprint arXiv:2007.11934},
  year={2021}
}

@article{volker2021anony,
  title={Anony mice d shareable data: Using mice to create and analyze multiply imputed synthetic datasets},
  author={Volker, Thom Benjamin and Vink, Gerko},
  journal={Psych},
  volume={3},
  number={4},
  pages={703--716},
  year={2021},
  publisher={MDPI}
}

@article{zhang2017privbayes,
  title={Privbayes: Private data release via bayesian networks},
  author={Zhang, Jun and Cormode, Graham and Procopiuc, Cecilia M and Srivastava, Divesh and Xiao, Xiaokui},
  journal={ACM Transactions on Database Systems (TODS)},
  volume={42},
  number={4},
  pages={1--41},
  year={2017},
  publisher={ACM New York, NY, USA}
}
